import whisper

# Load the "large" Whisper checkpoint once at start-up.
whisper_model = whisper.load_model("large")

# Hard-coded location of the audio file to transcribe (two adjacent raw
# string literals are concatenated into a single Windows path).
audio_path = (
    r"C:\Users\Administrator\Documents\WeChat "
    r"Files\wxid_a8ll54i2gfk012\FileStorage\File\2023-09\测试文件（英）.wav"
)
result = whisper_model.transcribe(audio_path)

# Collect the text of every segment, skipping any entry that is None,
# and print them on one line separated by ", ".
segment_texts = [
    segment["text"]
    for segment in result["segments"]
    if segment is not None
]
print(", ".join(segment_texts))
